See sóc on Wiktionary
{ "head_templates": [ { "args": { "1": "ca", "2": "verb form" }, "expansion": "sóc", "name": "head" } ], "lang": "Catalan", "lang_code": "ca", "pos": "verb", "senses": [ { "categories": [ { "kind": "other", "name": "Catalan entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w" }, { "kind": "other", "name": "Catalan pre-2016 spellings", "parents": [], "source": "w" }, { "kind": "other", "name": "Catalan words affected by 2016 spelling reform", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w" }, { "kind": "other", "name": "Pages with entries", "parents": [], "source": "w" }, { "_dis": "52 4 9 31 5", "kind": "other", "name": "Pages with 2 entries", "parents": [], "source": "w+disamb" }, { "_dis": "46 3 7 41 4", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" } ], "glosses": [ "Pre-2016 spelling of soc (first singular present indicative of ser and ésser)." ], "id": "en-sóc-ca-verb-OU06w~L5", "links": [ [ "soc", "soc#Catalan" ], [ "ser", "ser#Catalan" ], [ "ésser", "ésser#Catalan" ] ] } ], "sounds": [ { "ipa": "[ˈsok]", "tags": [ "Balearic", "Central", "Valencia" ] } ], "word": "sóc" } { "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "mkh-vie-pro", "3": "*prɔːk" }, "expansion": "Proto-Vietic *prɔːk", "name": "inh" }, { "args": { "1": "vi", "2": "mkh-pro", "3": "*prɔɔk" }, "expansion": "Proto-Mon-Khmer *prɔɔk", "name": "inh" }, { "args": { "1": "km", "2": "កំប្រុក" }, "expansion": "Khmer កំប្រុក (kɑmprok)", "name": "cog" }, { "args": { "1": "bdq", "2": "prok" }, "expansion": "Bahnar prok", "name": "cog" }, { "args": { "1": "kjg", "2": "-" }, "expansion": "Khmu", "name": "cog" } ], "etymology_text": "From Proto-Vietic *prɔːk, from Proto-Mon-Khmer *prɔɔk. Cognate with Khmer កំប្រុក (kɑmprok), Bahnar prok, Khmu [Cuang] pʰrɔːk.\nAttested as sóc in the Dictionarium Annamiticum Lusitanum et Latinum (1651).", "forms": [ { "form": "con", "tags": [ "classifier" ] }, { "form": "𱮗", "tags": [ "CJK" ] }, { "form": "朔", "tags": [ "CJK" ] } ], "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "𱮗, 朔" }, "expansion": "sóc • (𱮗, 朔)", "name": "head" }, { "args": { "1": "𱮗, 朔", "cls": "con" }, "expansion": "(classifier con) sóc • (𱮗, 朔)", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "noun", "senses": [ { "categories": [ { "kind": "other", "name": "Vietnamese nouns classified by con", "parents": [], "source": "w+disamb" }, { "_dis": "53 10 31 7", "kind": "lifeform", "langcode": "vi", "name": "Squirrels", "orig": "vi:Squirrels", "parents": [ "Rodents", "Mammals", "Vertebrates", "Chordates", "Animals", "Lifeforms", "All topics", "Life", "Fundamental", "Nature" ], "source": "w+disamb" } ], "derived": [ { "word": "sóc chuột" } ], "glosses": [ "squirrel (rodent)" ], "id": "en-sóc-vi-noun-~zdEJq~t", "links": [ [ "squirrel", "squirrel" ] ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" } { "etymology_number": 2, "forms": [ { "form": "朔", "tags": [ "CJK" ] } ], "head_templates": [ { "args": { "1": "vi", "2": "verb", "3": "", "4": "", "head": "", "tr": "朔" }, "expansion": "sóc • (朔)", "name": "head" }, { "args": { "1": "朔" }, "expansion": "sóc • (朔)", "name": "vi-verb" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "verb", "senses": [ { "categories": [ { "_dis": "46 3 7 41 4", "kind": "other", "name": "Pages with entries", "parents": [], "source": "w+disamb" }, { "_dis": "7 31 58 4", "kind": "other", "name": "Vietnamese entries with incorrect language header", "parents": [ "Entries with incorrect language header", "Entry maintenance" ], "source": "w+disamb" } ], "derived": [ { "word": "chăm sóc" }, { "word": "coi sóc" }, { "word": "săn sóc" } ], "glosses": [ "to take care of, to look after" ], "id": "en-sóc-vi-verb-XqGlwI9j", "links": [ [ "take care", "take care" ], [ "look after", "look after" ] ], "raw_glosses": [ "(only in compounds) to take care of, to look after" ], "tags": [ "in-compounds" ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" } { "etymology_number": 3, "etymology_templates": [ { "args": { "1": "vi", "2": "km", "3": "ស្រុក" }, "expansion": "Khmer ស្រុក (srok)", "name": "bor" } ], "etymology_text": "From Khmer ស្រុក (srok).", "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "sóc", "name": "head" }, { "args": {}, "expansion": "sóc", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "noun", "senses": [ { "categories": [ { "_dis": "14 14 46 15 10", "kind": "other", "name": "Sino-Vietnamese words", "parents": [], "source": "w+disamb" }, { "_dis": "5 53 35 7", "kind": "place", "langcode": "vi", "name": "Villages", "orig": "vi:Villages", "parents": [ "Polities", "Places", "Names", "All topics", "Proper nouns", "Terms by semantic function", "Fundamental", "Nouns", "Lemmas" ], "source": "w+disamb" } ], "derived": [ { "word": "Sóc Trăng" } ], "glosses": [ "small Khmer village" ], "id": "en-sóc-vi-noun-Rc0E7m5P", "links": [ [ "small", "small" ], [ "Khmer", "Khmer" ], [ "village", "village" ] ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" } { "etymology_number": 4, "etymology_templates": [ { "args": { "1": "vi", "2": "朔" }, "expansion": "", "name": "etymid" }, { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "朔" }, "expansion": "Sino-Vietnamese word from 朔", "name": "vi-etym-sino" } ], "etymology_text": "Sino-Vietnamese word from 朔.", "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "sóc", "name": "head" }, { "args": {}, "expansion": "sóc", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "verb", "senses": [ { "categories": [ { "_dis": "4 5 14 76", "kind": "topical", "langcode": "vi", "name": "Calendar", "orig": "vi:Calendar", "parents": [ "Timekeeping", "Time", "All topics", "Fundamental" ], "source": "w+disamb" } ], "derived": [ { "word": "ngày sóc" } ], "glosses": [ "first day of the lunar month" ], "id": "en-sóc-vi-verb-rSI44Tc4", "links": [ [ "first", "first" ], [ "day", "day" ], [ "lunar month", "lunar month" ] ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" }
{ "categories": [ "Pages with 2 entries", "Pages with entries", "Sino-Vietnamese words", "vi:Calendar", "vi:Squirrels", "vi:Villages" ], "head_templates": [ { "args": { "1": "ca", "2": "verb form" }, "expansion": "sóc", "name": "head" } ], "lang": "Catalan", "lang_code": "ca", "pos": "verb", "senses": [ { "categories": [ "Catalan entries with incorrect language header", "Catalan non-lemma forms", "Catalan pre-2016 spellings", "Catalan superseded forms", "Catalan terms with IPA pronunciation", "Catalan verb forms", "Catalan words affected by 2016 spelling reform", "Pages with 2 entries", "Pages with entries" ], "glosses": [ "Pre-2016 spelling of soc (first singular present indicative of ser and ésser)." ], "links": [ [ "soc", "soc#Catalan" ], [ "ser", "ser#Catalan" ], [ "ésser", "ésser#Catalan" ] ] } ], "sounds": [ { "ipa": "[ˈsok]", "tags": [ "Balearic", "Central", "Valencia" ] } ], "word": "sóc" } { "categories": [ "Pages with 2 entries", "Pages with entries", "Sino-Vietnamese words", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese nouns classified by con", "Vietnamese terms derived from Proto-Mon-Khmer", "Vietnamese terms derived from Proto-Vietic", "Vietnamese terms inherited from Proto-Mon-Khmer", "Vietnamese terms inherited from Proto-Vietic", "Vietnamese terms with IPA pronunciation", "vi:Calendar", "vi:Squirrels", "vi:Villages" ], "derived": [ { "word": "sóc chuột" } ], "etymology_number": 1, "etymology_templates": [ { "args": { "1": "vi", "2": "mkh-vie-pro", "3": "*prɔːk" }, "expansion": "Proto-Vietic *prɔːk", "name": "inh" }, { "args": { "1": "vi", "2": "mkh-pro", "3": "*prɔɔk" }, "expansion": "Proto-Mon-Khmer *prɔɔk", "name": "inh" }, { "args": { "1": "km", "2": "កំប្រុក" }, "expansion": "Khmer កំប្រុក (kɑmprok)", "name": "cog" }, { "args": { "1": "bdq", "2": "prok" }, "expansion": "Bahnar prok", "name": "cog" }, { "args": { "1": "kjg", "2": "-" }, "expansion": "Khmu", "name": "cog" } ], "etymology_text": "From Proto-Vietic *prɔːk, from Proto-Mon-Khmer *prɔɔk. Cognate with Khmer កំប្រុក (kɑmprok), Bahnar prok, Khmu [Cuang] pʰrɔːk.\nAttested as sóc in the Dictionarium Annamiticum Lusitanum et Latinum (1651).", "forms": [ { "form": "con", "tags": [ "classifier" ] }, { "form": "𱮗", "tags": [ "CJK" ] }, { "form": "朔", "tags": [ "CJK" ] } ], "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "𱮗, 朔" }, "expansion": "sóc • (𱮗, 朔)", "name": "head" }, { "args": { "1": "𱮗, 朔", "cls": "con" }, "expansion": "(classifier con) sóc • (𱮗, 朔)", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "noun", "senses": [ { "glosses": [ "squirrel (rodent)" ], "links": [ [ "squirrel", "squirrel" ] ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" } { "categories": [ "Pages with 2 entries", "Pages with entries", "Sino-Vietnamese words", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese terms with IPA pronunciation", "Vietnamese verbs", "vi:Calendar", "vi:Squirrels", "vi:Villages" ], "derived": [ { "word": "chăm sóc" }, { "word": "coi sóc" }, { "word": "săn sóc" } ], "etymology_number": 2, "forms": [ { "form": "朔", "tags": [ "CJK" ] } ], "head_templates": [ { "args": { "1": "vi", "2": "verb", "3": "", "4": "", "head": "", "tr": "朔" }, "expansion": "sóc • (朔)", "name": "head" }, { "args": { "1": "朔" }, "expansion": "sóc • (朔)", "name": "vi-verb" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "verb", "senses": [ { "glosses": [ "to take care of, to look after" ], "links": [ [ "take care", "take care" ], [ "look after", "look after" ] ], "raw_glosses": [ "(only in compounds) to take care of, to look after" ], "tags": [ "in-compounds" ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" } { "categories": [ "Pages with 2 entries", "Pages with entries", "Sino-Vietnamese words", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese terms borrowed from Khmer", "Vietnamese terms derived from Khmer", "Vietnamese terms with IPA pronunciation", "vi:Calendar", "vi:Squirrels", "vi:Villages" ], "derived": [ { "word": "Sóc Trăng" } ], "etymology_number": 3, "etymology_templates": [ { "args": { "1": "vi", "2": "km", "3": "ស្រុក" }, "expansion": "Khmer ស្រុក (srok)", "name": "bor" } ], "etymology_text": "From Khmer ស្រុក (srok).", "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "sóc", "name": "head" }, { "args": {}, "expansion": "sóc", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "noun", "senses": [ { "glosses": [ "small Khmer village" ], "links": [ [ "small", "small" ], [ "Khmer", "Khmer" ], [ "village", "village" ] ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" } { "categories": [ "Pages with 2 entries", "Pages with entries", "Sino-Vietnamese words", "Vietnamese entries with incorrect language header", "Vietnamese lemmas", "Vietnamese nouns", "Vietnamese terms with IPA pronunciation", "vi:Calendar", "vi:Squirrels", "vi:Villages" ], "derived": [ { "word": "ngày sóc" } ], "etymology_number": 4, "etymology_templates": [ { "args": { "1": "vi", "2": "朔" }, "expansion": "", "name": "etymid" }, { "args": { "1": "vi", "2": "Sino-Vietnamese words" }, "expansion": "", "name": "categorize" }, { "args": { "1": "朔" }, "expansion": "Sino-Vietnamese word from 朔", "name": "vi-etym-sino" } ], "etymology_text": "Sino-Vietnamese word from 朔.", "head_templates": [ { "args": { "1": "vi", "2": "noun", "3": "", "4": "", "head": "", "tr": "" }, "expansion": "sóc", "name": "head" }, { "args": {}, "expansion": "sóc", "name": "vi-noun" } ], "lang": "Vietnamese", "lang_code": "vi", "pos": "verb", "senses": [ { "glosses": [ "first day of the lunar month" ], "links": [ [ "first", "first" ], [ "day", "day" ], [ "lunar month", "lunar month" ] ] } ], "sounds": [ { "ipa": "[sawk͡p̚˧˦]", "tags": [ "Hà-Nội" ] }, { "ipa": "[ʂawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[sawk͡p̚˦˧˥]", "tags": [ "Huế" ] }, { "ipa": "[ʂawk͡p̚˦˥]", "note": "Saigon" }, { "ipa": "[sawk͡p̚˦˥]", "note": "Saigon" } ], "word": "sóc" }
Download raw JSONL data for sóc meaning in All languages combined (6.7kB)
This page is a part of the kaikki.org machine-readable All languages combined dictionary. This dictionary is based on structured data extracted on 2025-01-10 from the enwiktionary dump dated 2025-01-01 using wiktextract (df33d17 and 4ed51a5). The data shown on this site has been post-processed and various details (e.g., extra categories) removed, some information disambiguated, and additional data merged from other sources. See the raw data download page for the unprocessed wiktextract data.
If you use this data in academic research, please cite Tatu Ylonen: Wiktextract: Wiktionary as Machine-Readable Structured Data, Proceedings of the 13th Conference on Language Resources and Evaluation (LREC), pp. 1317-1325, Marseille, 20-25 June 2022. Linking to the relevant page(s) under https://kaikki.org would also be greatly appreciated.